# Hyperparameter configuration: a flat mapping of numeric scalars.
# NOTE(review): the code that loads this file is not visible from here, so the
# per-key notes below are inferred from the key names only. Confirm each one
# against the consumer before relying on it.
#
# Presumably the number of hidden layers in the model - TODO confirm.
num_hidden_layer: 3
# Presumably the width (unit count) of each hidden layer - TODO confirm.
hidden_dim: 16
# Presumably the optimizer step size - TODO confirm.
learning_rate: 0.001
# Presumably the number of training/optimization epochs - TODO confirm.
num_epochs: 1000
# Presumably the weight of an L2 penalty (weight decay) - TODO confirm.
l2_coeff: 0.0005
# Presumably a dropout probability; 0.0 would then mean dropout is disabled -
# TODO confirm.
dropout_rate: 0.0
# The four coefficients below look like weights of L1 ("l1") and entropy
# ("ent") regularization terms applied to "x" and to "edge" quantities.
# NOTE(review): what "x" refers to (e.g. input/node features or a mask over
# them) cannot be determined from this file - verify against the loss code.
x_l1_coeff: 0.0005
x_ent_coeff: 0.001
# NOTE(review): the edge coefficients are orders of magnitude larger than the
# "x" ones; presumably intentional, but worth confirming.
edge_l1_coeff: 0.5
edge_ent_coeff: 0.1
